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<222> (1457) 
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t 



<400> 1 

ctgcagcctg 

gggccaagaa 

tcctgccccg 

tttctagaga 

ttatttgaac 

gctcaataaa 

gcccgggtac 

tgttccttgg 

gggggctcgt 

caagctggcc 
tgcgcctgcg 
ctgacgagtt 
gtttttgtgg 
tggttctggt 
cggtttggaa 
ctgactgtgt 
ttgaccttag 
aagaagagac 
ccgcgagacg 
cctggcccgc 
tttgaccccc 
ccatccgccc 



aatatgggcc 
cagatggaac 
gctcagggcc 
accatcagat 
taaccaatca 
agagcccaca 
ccgtgtatcc 
gagggtctcc 
ccgggatcgg 
agcaacttat 
tcggtactag 
ctgaacaccc 
cccgacctga 
aggagacgag 
ccgaagccgc 
ttctgtattt 
gtaactggaa 
gttgggttac 
gcacctttaa 
atggacaccc 
ctccctgggt 
cgtctctccc 



aaacaggata 
agctgaatat 
aagaacagat 
gtttccaggg 
gttcgcttct 
acccctcact 
aataaaccct 
tctgagtgat 
gagacccctg 
ctgtgtctgt 
ttagctaact 
ggccgcaacc 
ggaagggagt 
aacctaaaac 
gcgtcttgtc 
gtctgaaaat 
agatgtcgag 
cttctgctct 
ccgagacctc 
agaccaggtc 
caagcccttt 
ccttgaacct 



tctgtggtaa 
gggccaaaca 
ggtccccaga 
tgccccaagg 
cgcttctgtt 
cggggcgcca 
cttgcagttg 
tgactacccg 
cccagggacc 
ccgattgtct 
agctctgtat 
ctgggagacg 
cgatgtggaa 
agttcccgcc 
tgctgcagca 
tagggccaga 
cggctcgctc 
gcagaatggc 
atcacccagg 
ccctacatcg 
gtacacccta 
cctcgttcga 



gcagttcctg 
ggatatctgt 
tgcggtccag 
acctgaaatg 
cgcgcgcttc 
gtcctccgat 
catccgactt 
tcagcggggg 
accgacccac 
agtgtctatg 
ctggcggacc 
tcccagggac 
tccgaccccg 
tccgtctgaa 
tcgttctgtg 
ctgttaccac 
acaaccagtc 
caacctttaa 
ttaagatcaa 
tgacctggga 
agcctccgcc 
ccccgcctcg 



ccccggctca 
ggtaagcagt 
ccctcagcag 
accctgtgcc 
tgctccccga 
tgactgagtc 
gtggtctcgc 
tctttcattt 
caccgggagg 
actgatttta 
cgtggtggaa 
tttgggggcc 
tcaggatatg 
tttttgcttt 
ttgtctctgt 
tcccttaagt 
ggtagatgtc 
cgtcggatgg 
ggtcttttca 
agccttggct 
tcctcttcct 
atcctccctt 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 



tatccagccc 
atagggcgat 



tcactccttc 
tcgaatcagg 



tctaggcgcc 
ccttggcgcg 



ggccgctcta 
ccggatcctt 



gcccattaat 
aattaagcgc 



acgactcact 
aattgggagg 



1380 
1440 
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tggcggtagc ctcgag atg ggc gtg att acg gat tea ctg gcc gtc gtg gcc 14 92 

Met Gly Val Ile Thr Asp Ser Leu Ala Val Val Ala 
1 5 10 

cgc acc gat cgc cct tcc caa cag tta cgc agc ctg aat ggc gaa tgg 1540 
Arg Thr Asp Arg Pro Ser Gln Gln Leu Arg Ser Leu Asn Gly Glu Trp 
15 20 25 

cgc ttt gcc tgg ttt ccg gca cca gaa gcg gtg ccg gaa agc tgg ctg 1588 
Arg Phe Ala Trp Phe Pro Ala Pro Glu Ala Val Pro Glu Ser Trp Leu 
30 35 40 

gag tgc gat ctt cct gag gcc gat act gtc gtc gtc ccc tca aac tgg 1636 
Glu Cys Asp Leu Pro Glu Ala Asp Thr Val Val Val Pro Ser Asn Trp 
45 50 55 60 

cag atg cac ggt tac gat gcg ccc atc tac acc aac gtg acc tat ccc 1684 
Gln Met His Gly Tyr Asp Ala Pro Ile Tyr Thr Asn Val Thr Tyr Pro 
65 70 75 

att acg gtc aat ccg ccg ttt gtt ccc acg gag aat ccg acg ggt tgt 1732 
Ile Thr Val Asn Pro Pro Phe Val Pro Thr Glu Asn Pro Thr Gly Cys 
80 85 90 

tac tcg ctc aca ttt aat gtt gat gaa agc tgg cta cag gaa ggc cag 1780 
Tyr Ser Leu Thr Phe Asn Val Asp Glu Ser Trp Leu Gln Glu Gly Gln 
95 100 105 

acg cga att att ttt gat ggc gtt aac tcg gcg ttt cat ctg tgg tgc 1828 
Thr Arg Ile Ile Phe Asp Gly Val Asn Ser Ala Phe His Leu Trp Cys 
110 115 120 

aac ggg cgc tgg gtc ggt tac ggc cag gac agt cgt ttg ccg tct gaa 1876 
Asn Gly Arg Trp Val Gly Tyr Gly Gln Asp Ser Arg Leu Pro Ser Glu 
125 130 135 140 

ttt gac ctg agc gca ttt tta cgc gcc gga gaa aac cgc ctc gcg gtg 1924 
Phe Asp Leu Ser Ala Phe Leu Arg Ala Gly Glu Asn Arg Leu Ala Val 
145 150 155 

atg gtg ctg cgc tgg agt gac ggc agt tat ctg gaa gat cag gat atg 1972 
Met Val Leu Arg Trp Ser Asp Gly Ser Tyr Leu Glu Asp Gln Asp Met 
160 165 170 

tgg cgg atg agc ggc att ttc cgt gac gtc tcg ttg ctg cat aaa ccg 2020 
Trp Arg Met Ser Gly Ile Phe Arg Asp Val Ser Leu Leu His Lys Pro 
175 180 185 

act aca caa atc agc gat ttc cat gtt gcc act cgc ttt aat gat gat 2068 
Thr Thr Gln Ile Ser Asp Phe His Val Ala Thr Arg Phe Asn Asp Asp 
190 195 200 

ttc agc cgc gct gta ctg gag gct gaa gtt cag atg tgc ggc gag ttg 2116 
Phe Ser Arg Ala Val Leu Glu Ala Glu Val Gln Met Cys Gly Glu Leu 
205 210 215 220 



cgt gac tac cta cgg gta aca gtt tct tta tgg cag ggt gaa acg cag 2164 
Arg Asp Tyr Leu Arg Val Thr Val Ser Leu Trp Gln Gly Glu Thr Gln 
225 230 235 
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gtc gcc age 
Val Ala Ser 



ggt ggt tat 
Gly Gly Tyr 
255 

aaa ctg tgg 
Lys Leu Trp 
270 

ctg cac acc 
Leu His Thr 
285 

ggt ttc cgc 
Gly Phe Arg 



aag ccg ttg 
Lys Pro Leu 



cat ggt cag 
His Gly Gin 
335 

atg aag cag 
Met Lys Gin 
350 

cat ccg ctg 
His Pro Leu 
365 

gat gaa gcc 
Asp Glu Ala 



acc gat gat 
Thr Asp Asp 



atg gtg cag 
Met Val Gin 
415 

ggg aat gaa 
Gly Asn Glu 
430 

ate aaa tct 
lie Lys Ser 
445 



ggc acc gcg 
Gly Thr Ala 
240 

gcc gat cgc 
Ala Asp Arg 



age gcc gaa 
Ser Ala Glu 



gcc gac ggc 
Ala Asp Gly 
290 

gag gtg egg 
Glu Val Arg 
305 

ctg att cga 
Leu lie Arg 
320 

gtc atg gat 
Val Met Asp 



aac aac ttt 
Asn Asn Phe 



tgg tac acg 
Trp Tyr Thr 
370 

aat att gaa 
Asn lie Glu 
385 

ccg cgc tgg 
Pro Arg Trp 
400 

cgc gat cgt 
Arg Asp Arg 



tea ggc cac 
Ser Gly His 



gtc gat cet 
Val Asp Pro 
450 



cet ttc ggc 
Pro Phe Gly 
245 

gtc aca eta 
Val Thr Leu 
260 

ate ccg aat 
lie Pro Asn 
275 

acg ctg att 
Thr Leu He 



att gaa aat 
He Glu Asn 



ggc gtt aac 
Gly Val Asn 
325 

gag cag acg 
Glu Gin Thr 
340 

aac gcc gtg 
Asn Ala Val 
355 

ctg tge gac 
Leu Cys Asp 



acc cac ggc 
Thr His Gly 



eta ccg gcg 
Leu Pro Ala 
405 

aat cac ccg 
Asn His Pro 
420 

ggc get aat 
Gly Ala Asn 
435 

tec cgc ccg 
Ser Arg Pro 



ggt gaa att 
Gly Glu lie 



cgt ctg aac 
Arg Leu Asn 



etc tat cgt 
Leu Tyr Arg 
280 

gaa gea gaa 
Glu Ala Glu 
295 

ggt ctg ctg 
Gly Leu Leu 
310 

cgt cac gag 
Arg His Glu 



atg gtg cag 
Met Val Gin 



cgc tgt teg 
Arg Cys Ser 
360 

cgc tac ggc 
Arg Tyr Gly 
375 

atg gtg cca 
Met Val Pro 
390 

atg age gaa 
Met Ser Glu 



agt gtg ate 
Ser Val He 



cac gac gcg 
His Asp Ala 
440 

gtg cag tat 
Val Gin Tyr 
455 



ate gat gag 
He Asp Glu 
250 

gtc gaa aac 
Val Glu Asn 
265 

gcg gtg gtt 
Ala Val Val 



gcc tgc gat 
Ala Cys Asp 



ctg ctg aac 
Leu Leu Asn 
315 

cat cat cet 
His His Pro 
330 

gat ate ctg 
Asp He Leu 
345 

cat tat ccg 
His Tyr Pro 



ctg tat gtg 
Leu Tyr Val 



atg aat cgt 
Met Asn Arg 
395 

cgc gta acg 
Arg Val Thr 
410 

ate tgg teg 
He Trp Ser 
425 

ctg tat cgc 
Leu Tyr Arg 



gaa ggc ggc 
Glu Gly Gly 



cgt 2212 
Arg 



ccg 2260 
Pro 



gaa 2308 
Glu 



gtc 2356 

Val 

300 

ggc 2404 
Gly 



ctg 2452 
Leu 



ctg 2500 
Leu 



aac 2548 
Asn 



gtg 2596 

Val 

380 

ctg 2644 
Leu 



cga 2692 
Arg 



ctg 2740 
Leu 



tgg 2788 
Trp 



gga 2836 

Gly 

460 



gcc gac acc acg gcc acc gat att att tgc ccg atg tac gcg cgc gtg 2884 
Ala Asp Thr Thr Ala Thr Asp Ile Ile Cys Pro Met Tyr Ala Arg Val 
465 470 475 
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gat gaa gac cag ccc ttc ccg get gtg ccg aaa tgg tec ate aaa aaa 2932 
Asp Glu Asp Gln Pro Phe Pro Ala Val Pro Lys Trp Ser Ile Lys Lys 
480 485 490 

tgg ctt tcg cta cct gga gag acg cgc ccg ctg atc ctt tgc gaa tac 2980 
Trp Leu Ser Leu Pro Gly Glu Thr Arg Pro Leu Ile Leu Cys Glu Tyr 
495 500 505 

gcc cac gcg atg ggt aac agt ctt ggc ggt ttc gct aaa tac tgg cag 3028 
Ala His Ala Met Gly Asn Ser Leu Gly Gly Phe Ala Lys Tyr Trp Gln 
510 515 520 

gcg ttt cgt cag tat ccc cgt tta cag ggc ggc ttc gtc tgg gac tgg 3076 
Ala Phe Arg Gln Tyr Pro Arg Leu Gln Gly Gly Phe Val Trp Asp Trp 
525 530 535 540 

gtg gat cag tcg ctg att aaa tat gat gaa aac ggc aac ccg tgg tcg 3124 
Val Asp Gln Ser Leu Ile Lys Tyr Asp Glu Asn Gly Asn Pro Trp Ser 
545 550 555 

gct tac ggc ggt gat ttt ggc gat acg ccg aac gat cgc cag ttc tgt 3172 
Ala Tyr Gly Gly Asp Phe Gly Asp Thr Pro Asn Asp Arg Gln Phe Cys 
560 565 570 

atg aac ggt ctg gtc ttt gcc gac cgc acg ccg cat cca gcg ctg acg 3220 
Met Asn Gly Leu Val Phe Ala Asp Arg Thr Pro His Pro Ala Leu Thr 
575 580 585 

gaa gca aaa cac cag cag cag ttt ttc cag ttc cgt tta tcc ggg caa 3268 
Glu Ala Lys His Gln Gln Gln Phe Phe Gln Phe Arg Leu Ser Gly Gln 
590 595 600 

acc atc gaa gtg acc agc gaa tac ctg ttc cgt cat agc gat aac gag 3316 
Thr Ile Glu Val Thr Ser Glu Tyr Leu Phe Arg His Ser Asp Asn Glu 
605 610 615 620 

ctc ctg cac tgg atg gtg gcg ctg gat ggt aag ccg ctg gca agc ggt 3364 
Leu Leu His Trp Met Val Ala Leu Asp Gly Lys Pro Leu Ala Ser Gly 
625 630 635 

gaa gtg cct ctg gat gtc gct cca caa ggt aaa cag ttg att gaa ctg 3412 
Glu Val Pro Leu Asp Val Ala Pro Gln Gly Lys Gln Leu Ile Glu Leu 
640 645 650 

cct gaa cta ccg cag ccg gag agc gcc ggg caa ctc tgg ctc aca gta 3460 
Pro Glu Leu Pro Gln Pro Glu Ser Ala Gly Gln Leu Trp Leu Thr Val 
655 660 665 

cgc gta gtg caa ccg aac gcg acc gca tgg tca gaa gcc ggg cac atc 3508 
Arg Val Val Gln Pro Asn Ala Thr Ala Trp Ser Glu Ala Gly His Ile 
670 675 680 

agc gcc tgg cag cag tgg cgt ctg gcg gaa aac ctc agt gtg acg ctc 3556 
Ser Ala Trp Gln Gln Trp Arg Leu Ala Glu Asn Leu Ser Val Thr Leu 
685 690 695 700 



ccc gcc gcg tcc cac gcc atc ccg cat ctg acc acc agc gaa atg gat 3604 
Pro Ala Ala Ser His Ala Ile Pro His Leu Thr Thr Ser Glu Met Asp 
705 710 715 
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ttt tgc ate 
Phe Cys lie 



ggc ttt ctt 
Gly Phe Leu 
735 

ccg ctg cgc 
Pro Leu Arg 
750 

gta agt gaa 
Val Ser Glu 
765 

aag gcg gcg 
Lys Ala Ala 



gca gat aca 
Ala Asp Thr 



cag cat cag 
Gin His Gin 
815 

gat ggt agt 
Asp Gly Ser 
830 

gat aca ccg 
Asp Thr Pro 
845 

gta gca gag 
Val Ala Glu 



ccc gac cgc 
Pro Asp Arg 



tea gac atg 
Ser Asp Met 
895 

tgc ggg acg 
Cys Gly Thr 
910 

ttc cag ttc 
Phe Gin Phe 
925 



gag ctg ggt 
Glu Leu Gly 
720 

tea cag atg 
Ser Gin Met 



gat cag ttc 
Asp Gin Phe 



gcg ace cgc 
Ala Thr Arg 
770 

ggc cat tac 
Gly His Tyr 
785 

ctt get gat 
Leu Ala Asp 
800 

ggg aaa acc 
Gly Lys Thr 



ggt caa atg 
Gly Gin Met 



cat ccg gcg 
His Pro Ala 
850 

egg gta aae 
Arg Val Asn 
865 

ctt act gee 
Leu Thr Ala 
880 

tat ace ccg 
Tyr Thr Pro 



cgc gaa ttg 
Arg Glu Leu 



aae ate age 
Asn lie Ser 
930 



aat aag cgt 
Asn Lys Arg 
725 

tgg att ggc 
Trp lie Gly 
740 

acc cgt gca 
Thr Arg Ala 
755 

att gac cet 
lie Asp Pro 



cag gee gaa 
Gin Ala Glu 



gcg gtg ctg 
Ala Val Leu 
805 

tta ttt ate 
Leu Phe lie 
820 

gcg att acc 
Ala He Thr 
835 

egg att ggc 
Arg He Gly 



tgg etc gga 
Trp Leu Gly 



gee tgt ttt 
Ala Cys Phe 
885 

tac gte ttc 
Tyr Val Phe 
900 

aat tat ggc 
Asn Tyr Gly 
915 

cgc tac agt 
Arg Tyr Ser 



tgg caa ttt 
Trp Gin Phe 



gat aaa aaa 
Asp Lys Lys 



ccg ctg gat 
Pro Leu Asp 
760 

aae gee tgg 
Asn Ala Trp 
775 

gca gcg ttg 
Ala Ala Leu 
790 

att acg ace 
He Thr Thr 



age egg aaa 
Ser Arg Lys 



gtt gat gtt 
Val Asp Val 
840 

ctg aae tgc 
Leu Asn Cys 
855 

tta ggg ccg 
Leu Gly Pro 
870 

gac cgc tgg 
Asp Arg Trp 



ccg age gaa 
Pro Ser Glu 



cca cac cag 
Pro His Gin 
920 

caa cag caa 
Gin Gin Gin 
935 



aae cgc cag 
Asn Arg Gin 
730 

caa ctg ctg 
Gin Leu Leu 
745 

aae gac att 
Asn Asp He 



gte gaa ege 
Val Glu Arg 



ttg cag tgc 
Leu Gin Cys 
795 

get cac gcg 
Ala His Ala 
810 

acc tac egg 
Thr Tyr Arg 
825 

gaa gtg gcg 
Glu Val Ala 



cag ctg gcg 
Gin Leu Ala 



caa gaa aae 
Gin Glu Asn 
875 

gat ctg cca 
Asp Leu Pro 
890 

aae ggt ctg 
Asn Gly Leu 
905 

tgg cgc ggc 
Trp Arg Gly 



ctg atg gaa 
Leu Met Glu 



tea 3652 
Ser 



acg 3700 
Thr 



ggc 3748 
Gly 



tgg 3796 

Trp 

780 

acg 3844 
Thr 



tgg 3892 
Trp 



att 3940 
He 



age 3988 
Ser 



cag 4036 

Gin 

860 

tat 4084 
Tyr 



ttg 4132 
Leu 



cgc 4180 
Arg 



gac 4228 
Asp 



ace 4276 

Thr 

940 



agc cat cgc cat ctg ctg cac gcg gaa gaa ggc aca tgg ctg aat atc 4324 
Ser His Arg His Leu Leu His Ala Glu Glu Gly Thr Trp Leu Asn Ile 
945 950 955 
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gac ggt ttc cat atg ggg att ggt ggc gac gac tec tgg age ccg tea 
Asp Gly Phe His Met Gly Ile Gly Gly Asp Asp Ser Trp Ser Pro Ser 
960 965 970 



4372 



gta tcg gcg gaa ttc cag ctg agc gcc ggt cgc tac cat tac cag ttg 
Val Ser Ala Glu Phe Gln Leu Ser Ala Gly Arg Tyr His Tyr Gln Leu 
975 980 985 



4420 



gtc tgg tgt caa aaa aga tct gac tat aaa gat gag gac ctc gac cat 
Val Trp Cys Gln Lys Arg Ser Asp Tyr Lys Asp Glu Asp Leu Asp His 
990 995 1000 



4468 



cat cat cat cat cac cgg taataatagg tagataagtg actgattaga 
His His His His His Arg 
1005 1010 



4516 



tgcattgatc 
tgagggcceg 
tegeeaaagg 
cttgaagaca 
acaggtgcct 
cccagtgcca 
tattcaaeaa 
ggcctcggtg 
gaaccaeggg 
atggattgca 
cacaacagae 
cggttctttt 
cgeggctatc 
ctgaageggg 
ctcaccttgc 
cgcttgatcc 
gtactcggat 
tcgegceage 
tegtgaccca 
gattcatcga 
cccgtgatat 
gtatcgccgc 
gagegggact 
ggggggaatg 
caaggcatgg 
tggaacaget 
agggceaaga 
ttcctgcccc 
gtttctagag 
ettatttgaa 
agctcaataa 
cgcccgggta 
ctgttccttg 
catgcageat 
atagttgcat 
tccgcttcct 
getcacteaa 



cetcgaccaa 
gaaaeetgge 
aatgeaaggt 
aacaacgtct 
ctgcggccaa 
cgttgtgagt 
ggggctgaag 
cacatgcttt 
gaegtggttt 
cgeaggttct 
aatcggctge 
tgtcaagacc 
gtggctggcc 
aagggactgg 
tcctgccgag 
ggctacctgc 
ggaagccggt 
cgaaetgtte 
tggcgatgcc 
ctgtggcegg 
tgctgaagag 
tecegatteg 
etggggttcg 
aaagacccca 
aaaaatacat 
gaatatgggc 
aeagatggaa 
ggctcagggc 
aaccateaga 
etaaccaatc 
aagagcecae 
cccgtgtatc 
ggagggtcte 
gtatcaaaat 
taatgaateg 
egctcactga 
aggeggtaat 



ttccggttat 
ectgtettct 
etgttgaatg 
gtagegacce 
aagccacgtg 
tggatagttg 
gatgcccaga 
aeatgtgttt 
tcetttgaaa 
ceggccgett 
tetgatgccg 
gacctgtceg 
aegaegggcg 
ctgctattgg 
aaagtateca 
ccattcgace 
cttgtcgatc 
geeaggctea 
tgcttgccga 
etgggtgtgg 
ettggcggcg 
cagegcateg 
catcgataaa 
cctgtaggtt 
aactgagaat 
caaaeaggat 
eagctgaata 
eaagaacaga 
tgtttecagg 
agttcgcttc 
aacccctcac 
caataaacce 
ctctgagtga 
taatttggtt 
geeaacgege 
ctegctgcgc 
aegg 



tttccaccat 
tgacgagcat 
tegtgaagga 
tttgcaggca 
tataagatac 
tggaaagagt 
aggtacccca 
agtcgaggtt 
aacacgatga 
gggtggagag 
ccgtgttccg 
gtgccctgaa 
ttccttgccg 
gcgaagtgce 
teatggctga 
accaagegaa 
aggatgatct 
aggcgcgcat 
atatcatggt 
eggacegcta 
aatgggctga 
ccttctatcg 
ataaaagatt 
tggeaagcta 
agagaagttc 
atetgtggta 
tgggecaaac 
tggtccccag 
gtgccccaag 
tcgcttctgt 
teggggegee 
tettgeagtt 
ttgactaccc 
ttttttetta 
ggggagaggc 
tcggtcgttc 



attgeegtct 
tectaggggt 
ageagttcet 
gcggaaccec 
acctgcaaag 
caaatggetc 
ttgtatggga 
aaaaaaegte 
taataccatg 
getattegce 
getgtcagcg 
tgaaetgcag 
agctgtgctc 
ggggeaggat 
tgcaatgegg 
acatcgcatc 
ggacgaagag 
gcccgacggc 
ggaaaatggc 
tcaggacata 
ccgcttcctc 
ccttcttgae 
ttatttagtc 
gcttaagtaa 
agateaaggt 
ageagttcet 
aggatatetg 
atgcggtcea 
gacctgaaat 
tcgcgcgett 
agtcctccga 
geatccgact 
gtcagcgggg 
agtatttaca 
ggtttgcgta 
ggctgcggcg 



tttggcaatg 
ctttccccte 
ctggaagctt 
ceaeetggeg 
gcggcacaae 
teeteaagcg 
tetgatctgg 
taggeecccc 
attgaacaag 
tatgactggg 
caggggegee 
gaegaggcag 
gacgttgtca 
ctcctgteat 
eggctgeata 
gagegageae 
catcaggggc 
gaggatcteg 
cgcttttctg 
gegttggeta 
gtgctttacg 
gagttcttet 
tecagaaaaa 
cgecattttg 
caggaacaga 
gccccggctc 
tggtaagcag 
gecctcagea 
gaccctgtgc 
etgcteeccg 
ttgactgagt 
tgtggtctcg 
gtcttteatt 
ttaaatggce 
ttggcgctet 
ageggtatca 



4576 
4636 
4696 
4756 
4816 
4876 
4936 
4996 
5056 
5116 
5176 
5236 
5296 
5356 
5416 
5476 
5536 
5596 
5656 
5716 
5776 
5836 
5896 
5956 
6016 
6076 
6136 
6196 
6256 
6316 
6376 
6436 
6496 
6556 
6616 
6676 
6700 



<210> 2 

<211> 1010 

<212> PRT 

<213> Artificial Sequence 
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r 



<220> 

<223> Amino acid sequence for pICAST ALC 
<400> 2 

Met Gly Val Ile Thr Asp Ser Leu Ala Val Val Ala Arg Thr Asp Arg 

1 5 10 15 

Pro Ser Gln Gln Leu Arg Ser Leu Asn Gly Glu Trp Arg Phe Ala Trp 

20 25 30 

Phe Pro Ala Pro Glu Ala Val Pro Glu Ser Trp Leu Glu Cys Asp Leu 

35 40 45 

Pro Glu Ala Asp Thr Val Val Val Pro Ser Asn Trp Gln Met His Gly 

50 55 60 

Tyr Asp Ala Pro Ile Tyr Thr Asn Val Thr Tyr Pro Ile Thr Val Asn 
65 70 75 80 

Pro Pro Phe Val Pro Thr Glu Asn Pro Thr Gly Cys Tyr Ser Leu Thr 

85 90 95 

Phe Asn Val Asp Glu Ser Trp Leu Gln Glu Gly Gln Thr Arg Ile Ile 

100 105 110 

Phe Asp Gly Val Asn Ser Ala Phe His Leu Trp Cys Asn Gly Arg Trp 

115 120 125 

Val Gly Tyr Gly Gln Asp Ser Arg Leu Pro Ser Glu Phe Asp Leu Ser 

130 135 140 

Ala Phe Leu Arg Ala Gly Glu Asn Arg Leu Ala Val Met Val Leu Arg 
145 150 155 160 

Trp Ser Asp Gly Ser Tyr Leu Glu Asp Gln Asp Met Trp Arg Met Ser 

165 170 175 

Gly Ile Phe Arg Asp Val Ser Leu Leu His Lys Pro Thr Thr Gln Ile 

180 185 190 

Ser Asp Phe His Val Ala Thr Arg Phe Asn Asp Asp Phe Ser Arg Ala 

195 200 205 

Val Leu Glu Ala Glu Val Gln Met Cys Gly Glu Leu Arg Asp Tyr Leu 

210 215 220 

Arg Val Thr Val Ser Leu Trp Gln Gly Glu Thr Gln Val Ala Ser Gly 
225 230 235 240 

Thr Ala Pro Phe Gly Gly Glu Ile Ile Asp Glu Arg Gly Gly Tyr Ala 

245 250 255 

Asp Arg Val Thr Leu Arg Leu Asn Val Glu Asn Pro Lys Leu Trp Ser 

260 265 270 

Ala Glu Ile Pro Asn Leu Tyr Arg Ala Val Val Glu Leu His Thr Ala 

275 280 285 

Asp Gly Thr Leu Ile Glu Ala Glu Ala Cys Asp Val Gly Phe Arg Glu 

290 295 300 

Val Arg Ile Glu Asn Gly Leu Leu Leu Leu Asn Gly Lys Pro Leu Leu 
305 310 315 320 

Ile Arg Gly Val Asn Arg His Glu His His Pro Leu His Gly Gln Val 

325 330 335 

Met Asp Glu Gln Thr Met Val Gln Asp Ile Leu Leu Met Lys Gln Asn 

340 345 350 

Asn Phe Asn Ala Val Arg Cys Ser His Tyr Pro Asn His Pro Leu Trp 

355 360 365 

Tyr Thr Leu Cys Asp Arg Tyr Gly Leu Tyr Val Val Asp Glu Ala Asn 

370 375 380 

Ile Glu Thr His Gly Met Val Pro Met Asn Arg Leu Thr Asp Asp Pro 
385 390 395 400 

Arg Trp Leu Pro Ala Met Ser Glu Arg Val Thr Arg Met Val Gln Arg 
405 410 415 



Asp Arg Asn His Pro Ser Val Ile Ile Trp Ser Leu Gly Asn Glu Ser 

420 425 430 

Gly His Gly Ala Asn His Asp Ala Leu Tyr Arg Trp Ile Lys Ser Val 

435 440 445 

Asp Pro Ser Arg Pro Val Gln Tyr Glu Gly Gly Gly Ala Asp Thr Thr 
450 455 460 
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Ala 


Thr 


Asp 


He 


He 


Cys 


Pro 


Met 


Tyr 


Ala 


Arg 


Val 


Asp 


Glu 


Asp 


Gin 


465 










470 










475 










480 


Pro 


Phe 


Pro 


Ala 


Val 


Pro 


Lys 


Trp 


Ser 


He 


Lys 


Lys 


Trp 


Leu 


Ser 


Leu 










485 










490 










495 




Pro 


Gly 


Glu 


Thr 


Arg 


Pro 


Leu 


He 


Leu 


Cys 


Glu 


Tyr 


Ala 


His 


Ala 


Met 








500 










505 










510 






Gly 


Asn 


Ser 


Leu 


Gly 


Gly 


Phe 


Ala 


Lys 


Tyr 


Trp 


Gin 


Ala 


Phe 


Arg 


Gin 






515 










520 










525 








Tyr 


Pro 


Arg 


Leu 


Gin 


Gly 


Gly 


Phe 


Val 


Trp 


Asp 


Trp 


Val 


Asp 


Gin 


Ser 




530 










535 










540 










Leu 


He 


Lys 


Tyr 


Asp 


Glu 


Asn 


Gly 


Asn 


Pro 


Trp 


Ser 


Ala 


Tyr 


Gly 


Gly 


545 










550 










555 










560 


Asp 


Phe 


Gly 


Asp 


Thr 


Pro 


Asn 


Asp 


Arg 


Gin 


Phe 


Cys 


Met 


Asn 


Gly 


Leu 










565 










570 










575 




Val 


Phe 


Ala 


Asp 


Arg 


Thr 


Pro 


His 


Pro 


Ala 


Leu 


Thr 


Glu 


Ala 


Lys 


His 








580 










585 










590 






Gin 


Gin 


Gin 


Phe 


Phe 


Gin 


Phe 


Arg 


Leu 


Ser 


Gly 


Gin 


Thr 


He 


Glu 


Val 






595 










600 










605 








Thr 


Ser 


Glu 


Tyr 


Leu 


Phe 


Arg 


His 


Ser 


Asp 


Asn 


Glu 


Leu 


Leu 


His 


Trp 




610 










615 










620 










Met 


Val 


Ala 


Leu 


Asp 


Gly 


Lys 


Pro 


Leu 


Ala 


Ser 


Gly 


Glu 


Val 


Pro 


Leu 


625 










630 










635 










640 


Asp 


Val 


Ala 


Pro 


Gin 


Gly 


Lys 


Gin 


Leu 


He 


Glu 


Leu 


Pro 


Glu 


Leu 


Pro 










645 










650 










655 




Gin 


Pro 


Glu 


Ser 


Ala 


Gly 


Gin 


Leu 


Trp 


Leu 


Thr 


Val 


Arg 


Val 


Val 


Gin 








660 










665 










670 






Pro 


Asn 


Ala 


Thr 


Ala 


Trp 


Ser 


Glu 


Ala 


Gly 


His 


He 


Ser 


Ala 


Trp 


Gin 






675 










680 










685 








Gin 


Trp 


Arg 


Leu 


Ala 


Glu 


Asn 


Leu 


Ser 


Val 


Thr 


Leu 


Pro 


Ala 


Ala 


Ser 




690 










695 










700 










His 


Ala 


He 


Pro 


His 


Leu 


Thr 


Thr 


Ser 


Glu 


Met 


Asp 


Phe 


Cys 


He 


Glu 


705 










710 










715 










720 


Leu 


Gly 


Asn 


Lys 


Arg 


Trp 


Gin 


Phe 


Asn 


Arg 


Gin 


Ser 


Gly 


Phe 


Leu 


Ser 










725 










730 










735 




Gin 


Met 


Trp 


He 


Gly 


Asp 


Lys 


Lys 


Gin 


Leu 


Leu 


Thr 


Pro 


Leu 


Arg 


Asp 








740 










745 










750 






Gin 


Phe 


Thr 


Arg 


Ala 


Pro 


Leu 


Asp 


Asn 


Asp 


He 


Gly 


Val 


Ser 


Glu 


Ala 






755 










760 










765 








Thr 


Arg 


He 


Asp 


Pro 


Asn 


Ala 


Trp 


Val 


Glu 


Arg 


Trp 


Lys 


Ala 


Ala 


Gly 




770 










775 










780 










His 


Tyr 


Gin 


Ala 


Glu 


Ala 


Ala 


Leu 


Leu 


Gin 


Cys 


Thr 


Ala 


Asp 


Thr 


Leu 


785 










790 










795 










800 


Ala 


Asp 


Ala 


Val 


Leu 


He 


Thr 


Thr 


Ala 


His 


Ala 


Trp 


Gin 


His 


Gin 


Gly 










805 










810 










815 




Lys 


Thr 


Leu 


Phe 


He 


Ser 


Arg 


Lys 


Thr 


Tyr 


Arg 


He 


Asp 


Gly 


Ser 


Gly 








820 










825 










830 






Gin 


Met 


Ala 


He 


Thr 


Val 


Asp 


Val 


Glu 


Val 


Ala 


Ser 


Asp 


Thr 


Pro 


His 






835 










840 










845 








Pro 


Ala 


Arg 


He 


Gly 


Leu 


Asn 


Cys 


Gin 


Leu 


Ala 


Gin 


Val 


Ala 


Glu 


Arg 




850 










855 










860 










Val 


Asn 


Trp 


Leu 


Gly 


Leu 


Gly 


Pro 


Gin 


Glu 


Asn 


Tyr 


Pro 


Asp 


Arg 


Leu 


865 










870 










875 










880 


Thr 


Ala 


Ala 


Cys 


Phe 


Asp 


Arg 


Trp 


Asp 


Leu 


Pro 


Leu 


Ser 


Asp 


Met 


Tyr 










885 










890 










895 




Thr 


Pro 


Tyr 


Val 


Phe 


Pro 


Ser 


Glu 


Asn 


Gly 


Leu 


Arg 


Cys 


Gly 


Thr 


Arg 








900 










905 










910 






Glu 


Leu 


Asn 


Tyr 


Gly 


Pro 


His 


Gin 


Trp 


Arg 


Gly 


Asp 


Phe 


Gin 


Phe 


Asn 






915 










920 










925 








He 


Ser 


Arg 


Tyr 


Ser 


Gin 


Gin 


Gin 


Leu 


Met 


Glu 


Thr 


Ser 


His 


Arg 


His 




930 










935 










940 










Leu 


Leu 


His 


Ala 


Glu 


Glu 


Gly 


Thr 


Trp 


Leu 


Asn 


He 


Asp 


Gly 


Phe 


His 


945 










950 










955 










960 
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Met Gly lie Gly Gly Asp Asp Ser Trp Ser Pro Ser Val Ser Ala Glu 

965 970 975 

Phe Gln Leu Ser Ala Gly Arg Tyr His Tyr Gln Leu Val Trp Cys Gln 

980 985 990 

Lys Arg Ser Asp Tyr Lys Asp Glu Asp Leu Asp His His His His His 
995 1000 1005 

His Arg 
1010 



<210> 3 
<211> 8518 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Nucleotide sequence for pICAST ALN 
<400> 3 

ctgcagcctg aatatgggcc aaacaggata tctgtggtaa gcagttcctg ccccggctca 60 

gggccaagaa cagatggaac agctgaatat gggccaaaca ggatatctgt ggtaagcagt 120 

tcctgccccg gctcagggcc aagaacagat ggtccccaga tgcggtccag ccctcagcag 180 

tttctagaga accatcagat gtttccaggg tgccccaagg acctgaaatg accctgtgcc 240 

ttatttgaac taaccaatca gttcgcttct cgcttctgtt cgcgcgcttc tgctccccga 300 

gctcaataaa agagcccaca acccctcact cggggcgcca gtcctccgat tgactgagtc 360 

gcccgggtac ccgtgtatcc aataaaccct cttgcagttg catccgactt gtggtctcgc 420 

tgttccttgg gagggtctcc tctgagtgat tgactacccg tcagcggggg tctttcattt 480 

gggggctcgt ccgggatcgg gagacccctg cccagggacc accgacccac caccgggagg 540 

caagctggcc agcaacttat ctgtgtctgt ccgattgtct agtgtctatg actgatttta 600 

tgcgcctgcg tcggtactag ttagctaact agctctgtat ctggcggacc cgtggtggaa 660 

ctgacgagtt ctgaacaccc ggccgcaacc ctgggagacg tcccagggac tttgggggcc 720 

gtttttgtgg cccgacctga ggaagggagt cgatgtggaa tccgaccccg tcaggatatg 780 

tggttctggt aggagacgag aacctaaaac agttcccgcc tccgtctgaa tttttgcttt 840 

cggtttggaa ccgaagccgc gcgtcttgtc tgctgcagca tcgttctgtg ttgtctctgt 900 

ctgactgtgt ttctgtattt gtctgaaaat tagggccaga ctgttaccac tcccttaagt 960 

ttgaccttag gtaactggaa agatgtcgag cggctcgctc acaaccagtc ggtagatgtc 1020 

aagaagagac gttgggttac cttctgctct gcagaatggc caacctttaa cgtcggatgg 1080 

ccgcgagacg gcacctttaa ccgagacctc atcacccagg ttaagatcaa ggtcttttca 1140 

cctggcccgc atggacaccc agaccaggtc ccctacatcg tgacctggga agccttggct 1200 

tttgaccccc ctccctgggt caagcccttt gtacacccta agcctccgcc tcctcttcct 1260 

ccatccgccc cgtctctccc ccttgaacct cctcgttcga ccccgcctcg atcctccctt 1320 

tatccagccc tcactccttc tctaggcgcc ggccgctcta gcccattaat acgactcact 1380 

atagggcgat tcgaacacca tgcaccatca tcatcatcac gtcgactata aagatgagga 1440 

cctcgagatg ggcgtgatta cggattcact ggccgtcgtg gcccgcaccg atcgcccttc 1500 

ccaacagtta cgcagcctga atggcgaatg gcgctttgcc tggtttccgg caccagaagc 1560 

ggtgccggaa agctggctgg agtgcgatct tcctgaggcc gatactgtcg tcgtcccctc 1620 

aaactggcag atgcacggtt acgatgcgcc catctacacc aacgtgacct atcccattac 1680 

ggtcaatccg ccgtttgttc ccacggagaa tccgacgggt tgttactcgc tcacatttaa 1740 

tgttgatgaa agctggctac aggaaggcca gacgcgaatt atttttgatg gcgttaactc 1800 

ggcgtttcat ctgtggtgca acgggcgctg ggtcggttac ggccaggaca gtcgtttgcc 1860 

gtctgaattt gacctgagcg catttttacg cgccggagaa aaccgcctcg cggtgatggt 1920 

gctgcgctgg agtgacggca gttatctgga agatcaggat atgtggcgga tgagcggcat 1980 

tttccgtgac gtctcgttgc tgcataaacc gactacacaa atcagcgatt tccatgttgc 2040 

cactcgcttt aatgatgatt tcagccgcgc tgtactggag gctgaagttc agatgtgcgg 2100 

cgagttgcgt gactacctac gggtaacagt ttctttatgg cagggtgaaa cgcaggtcgc 2160 

cagcggcacc gcgcctttcg gcggtgaaat tatcgatgag cgtggtggtt atgccgatcg 2220 



cgtcacacta cgtctgaacg tcgaaaaccc gaaactgtgg agcgccgaaa tcccgaatct 2280 

ctatcgtgcg gtggttgaac tgcacaccgc cgacggcacg ctgattgaag cagaagcctg 2340 

cgatgtcggt ttccgcgagg tgcggattga aaatggtctg ctgctgctga acggcaagcc 2400 

gttgctgatt cgaggcgtta accgtcacga gcatcatcct ctgcatggtc aggtcatgga 2460 

tgagcagacg atggtgcagg atatcctgct gatgaagcag aacaacttta acgccgtgcg 2520 

ctgttcgcat tatccgaacc atccgctgtg gtacacgctg tgcgaccgct acggcctgta 2580 
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tgtggtggat 
tgatccgcgc 
taatcacccg 
cgacgcgctg 
cggcggagcc 
agaccagccc 
agagacgcgc 
tttcgctaaa 
ggactgggtg 
cggcggtgat 
tgccgaccgc 
gttccgttta 
taacgagctc 
gcctctggat 
ggagagcgcc 
gtcagaagcc 
gacgctcccc 
catcgagctg 
gtggattggc 
gctggataac 
acgctggaag 
tacacttgct 
cttatttatc 
tgatgttgaa 
ggcgcaggta 
ccgccttact 
gtacgtcttc 
acaccagtgg 
ggaaaccagc 
tttccatatg 
gctgagcgcc 
tggcagcagg 
ataagtgact 
gccgtctttt 
taggggtctt 
agttcctctg 
gaacccccca 
tgcaaaggcg 
atggctctcc 
tatgggatct 
aaacgtctag 
taccatgatt 
attcggctat 
gtcagcgcag 
actgcaggac 
tgtgctcgac 
gcaggatctc 
aatgcggcgg 
tcgcatcgag 
cgaagagcat 
cgacggcgag 
aaatggccgc 
ggacatagcg 
cttcctcgtg 
tcttgacgag 
tttagtctcc 



taagtaacgc 
tcaaggtcag 
agttcctgcc 
atatctgtgg 
cggtccagcc 
ctgaaatgac 



gaagccaata 
tggctaccgg 
agtgtgatca 
tatcgctgga 
gacaccacgg 
ttcccggctg 
ccgctgatcc 
tactggcagg 
gatcagtcgc 
tttggcgata 
acgccgcatc 
tccgggcaaa 
ctgcactgga 
gtcgctccac 
gggcaactct 
gggcacatca 
gccgcgtccc 
ggtaataagc 
gataaaaaac 
gacattggcg 
gcggcgggcc 
gatgcggtgc 
agccggaaaa 
gtggcgagcg 
gcagagcggg 
gccgcctgtt 
ccgagcgaaa 
cgcggcgact 
catcgccatc 
gggattggtg 
ggtcgctacc 
ccttggcgcg 
gattagatgc 
ggcaatgtga 
tcccctctcg 
gaagcttctt 
cctggcgaca 
gcacaacccc 
tcaagcgtat 
gatctggggc 
gccccccgaa 
gaacaagatg 
gactgggcac 
gggcgcccgg 
gaggcagcgc 
gttgtcactg 
ctgtcatctc 
ctgcatacgc 
cgagcacgta 
caggggctcg 
gatctcgtcg 
ttttctggat 
ttggctaccc 
ctttacggta 
ttcttctgag 
agaaaaaggg 



cattttgcaa 
gaacagatgg 
ccggctcagg 
taagcagttc 
ctcagcagtt 
cctgtgcctt 



ttgaaaccca 
cgatgagcga 
tctggtcgct 
tcaaatctgt 
ccaccgatat 
tgccgaaatg 
tttgcgaata 
cgtttcgtca 
tgattaaata 
cgccgaacga 
cagcgctgac 
ccatcgaagt 
tggtggcgct 
aaggtaaaca 
ggctcacagt 
gcgcctggca 
acgccatccc 
gttggcaatt 
aactgctgac 
taagtgaagc 
attaccaggc 
tgattacgac 
cctaccggat 
atacaccgca 
taaactggct 
ttgaccgctg 
acggtctgcg 
tccagttcaa 
tgctgcacgc 
gcgacgactc 
attaccagtt 
ccggatcctt 
attgatccct 
gggcccggaa 
ccaaaggaat 
gaagacaaac 
ggtgcctctg 
agtgccacgt 
tcaacaaggg 
ctcggtgcac 
ccacggggac 
gattgcacgc 
aacagacaat 
ttctttttgt 
ggctatcgtg 
aagcgggaag 
accttgctcc 
ttgatccggc 
ctcggatgga 
cgccagccga 
tgacccatgg 
tcatcgactg 
gtgatattgc 
tcgccgctcc 
cgggactctg 
gggaatgaaa 



cggcatggtg 
acgcgtaacg 
ggggaatgaa 
cgatccttcc 
tatttgcccg 
gtccatcaaa 
cgcccacgcg 
gtatccccgt 
tgatgaaaac 
tcgccagttc 
ggaagcaaaa 
gaccagcgaa 
ggatggtaag 
gttgattgaa 
acgcgtagtg 
gcagtggcgt 
gcatctgacc 
taaccgccag 
gccgctgcgc 
gacccgcatt 
cgaagcagcg 
cgctcacgcg 
tgatggtagt 
tccggcgcgg 
cggattaggg 
ggatctgcca 
ctgcgggacg 
catcagccgc 
ggaagaaggc 
ctggagcccg 
ggtctggtgt 
aattaacaat 
cgaccaattc 
acctggccct 
gcaaggtctg 
aacgtctgta 
cggccaaaag 
tgtgagttgg 
gctgaaggat 
atgctttaca 
gtggttttcc 
aggttctccg 
cggctgctct 
caagaccgac 
gctggccacg 
ggactggctg 
tgccgagaaa 
tacctgccca 
agccggtctt 
actgttcgcc 
cgatgcctgc 
tggccggctg 
tgaagagctt 
cgattcgcag 
gggttcgcat 
gaccccacct 



ccaatgaatc 
cgaatggtgc 
tcaggccacg 
cgcccggtgc 
atgtacgcgc 
aaatggcttt 
atgggtaaca 
ttacagggcg 
ggcaacccgt 
tgtatgaacg 
caccagcagc 
tacctgttcc 
ccgctggcaa 
ctgcctgaac 
caaccgaacg 
ctggcggaaa 
accagcgaaa 
tcaggctttc 
gatcagttca 
gaccctaacg 
ttgttgcagt 
tggcagcatc 
ggtcaaatgg 
attggcctga 
ccgcaagaaa 
ttgtcagaca 
cgcgaattga 
tacagtcaac 
acatggctga 
tcagtatcgg 
caaaaaagat 
tgaccggtaa 
cggttatttt 
gtcttcttga 
ttgaatgtcg 
gcgacccttt 
ccacgtgtat 
atagttgtgg 
gcccagaagg 
tgtgtttagt 
tttgaaaaac 
gccgcttggg 
gatgccgccg 
ctgtccggtg 
acgggcgttc 
ctattgggcg 
gtatccatca 
ttcgaccacc 
gtcgatcagg 
aggctcaagg 
ttgccgaata 
ggtgtggcgg 
ggcggcgaat 
cgcatcgcct 
cgataaaata 
gtaggtttgg 



gtctgaccga 
agcgcgatcg 
gcgctaatca 
agtatgaagg 
gcgtggatga 
cgctacctgg 
gtcttggcgg 
gcttcgtctg 
ggtcggctta 
gtctggtctt 
agtttttcca 
gtcatagcga 
gcggtgaagt 
taccgcagcc 
cgaccgcatg 
acctcagtgt 
tggatttttg 
tttcacagat 
cccgtgcacc 
cctgggtcga 
gcacggcaga 
aggggaaaac 
cgattaccgt 
actgccagct 
actatcccga 
tgtatacccc 
attatggccc 
agcaactgat 
atatcgacgg 
cggaattcca 
ctggaggtgg 
taataggtag 
ccaccatatt 
cgagcattcc 
tgaaggaagc 
gcaggcagcg 
aagatacacc 
aaagagtcaa 
taccccattg 
cgaggttaaa 
acgatgataa 
tggagaggct 
tgttccggct 
ccctgaatga 
cttgcgcagc 
aagtgccggg 
tggctgatgc 
aagcgaaaca 
atgatctgga 
cgcgcatgcc 
tcatggtgga 
accgctatca 
gggctgaccg 
tctatcgcct 
aaagatttta 
caagctagct 



2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4320 
4380 
4440 
4500 
4560 
4620 
4680 
4740 
4800 
4860 
4920 
4980 
5040 
5100 
5160 
5220 
5280 
5340 
5400 
5460 
5520 
5580 
5640 
5700 
5760 
5820 
5880 
5940 



ggcatggaaa 
aacagctgaa 
gccaagaaca 
ctgccccggc 
tctagagaac 
atttgaacta 



aatacataac 
tatgggccaa 
gatggaacag 
tcagggccaa 
catcagatgt 
accaatcagt 



tgagaataga 
acaggatatc 
ctgaatatgg 
gaacagatgg 
ttccagggtg 
tcgcttctcg 



gaagttcaga 
tgtggtaagc 
gccaaacagg 
tccccagatg 
ccccaaggac 
cttctgttcg 



6000 
6060 
6120 
6180 
6240 
6300 
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0^ 



cgcgcttctg ctccccgagc tcaataaaag agcccacaac ccctcactcg gggcgccagt 6360 
cctccgattg actgagtcgc ccgggtaccc gtgtatccaa taaaccctct tgcagttgca 6420 
tccgacttgt ggtctcgctg ttccttggga gggtctcctc tgagtgattg actacccgtc 6480 
agcgggggtc tttcattcat gcagcatgta tcaaaattaa tttggttttt tttcttaagt 6540 
atttacatta aatggccata gttgcattaa tgaatcggcc aacgcgcggg gagaggcggt 6600 
ttgcgtattg gcgctcttcc gcttcctcgc tcactgactc gctgcgctcg gtcgttcggc 6660 
tgcggcgagc ggtatcagct cactcaaagg cggtaatacg gttatccaca gaatcagggg 6720 
ataacgcagg aaagaacatg tgagcaaaag gccagcaaaa ggccaggaac cgtaaaaagg 6780 
ccgcgttgct ggcgtttttc cataggctcc gcccccctga cgagcatcac aaaaatcgac 6840 
gctcaagtca gaggtggcga aacccgacag gactataaag ataccaggcg tttccccctg 6900 
gaagctccct cgtgcgctct cctgttccga ccctgccgct taccggatac ctgtccgcct 6960 
ttctcccttc gggaagcgtg gcgctttctc atagctcacg ctgtaggtat ctcagttcgg 7020 
tgtaggtcgt tcgctccaag ctgggctgtg tgcacgaacc ccccgttcag cccgaccgct 7080 
gcgccttatc cggtaactat cgtcttgagt ccaacccggt aagacacgac ttatcgccac 7140 
tggcagcagc cactggtaac aggattagca gagcgaggta tgtaggcggt gctacagagt 7200 
tcttgaagtg gtggcctaac tacggctaca ctagaagaac agtatttggt atctgcgctc 7260 
tgctgaagcc agttaccttc ggaaaaagag ttggtagctc ttgatccggc aaacaaacca 7320 
ccgctggtag cggtggtttt tttgtttgca agcagcagat tacgcgcaga aaaaaaggat 7380 
ctcaagaaga tcctttgatc ttttctacgg ggtctgacgc tcagtggaac gaaaactcac 7440 
gttaagggat tttggtcatg agattatcaa aaaggatctt cacctagatc cttttgcggc 7500 
cgcaaatcaa tctaaagtat atatgagtaa acttggtctg acagttacca atgcttaatc 7560 
agtgaggcac ctatctcagc gatctgtcta tttcgttcat ccatagttgc ctgactcccc 7620 
gtcgtgtaga taactacgat acgggagggc ttaccatctg gccccagtgc tgcaatgata 7680 
ccgcgagacc cacgctcacc ggctccagat ttatcagcaa taaaccagcc agccggaagg 7740 
gccgagcgca gaagtggtcc tgcaacttta tccgcctcca tccagtctat taattgttgc 7800 
cgggaagcta gagtaagtag ttcgccagtt aatagtttgc gcaacgttgt tgccattgct 7860 
acaggcatcg tggtgtcacg ctcgtcgttt ggtatggctt cattcagctc cggttcccaa 7920 
cgatcaaggc gagttacatg atcccccatg ttgtgcaaaa aagcggttag ctccttcggt 7980 
cctccgatcg ttgtcagaag taagttggcc gcagtgttat cactcatggt tatggcagca 8040 
ctgcataatt ctcttactgt catgccatcc gtaagatgct tttctgtgac tggtgagtac 8100 
tcaaccaagt cattctgaga atagtgtatg cggcgaccga gttgctcttg cccggcgtca 8160 
atacgggata ataccgcgcc acatagcaga actttaaaag tgctcatcat tggaaaacgt 8220 
tcttcggggc gaaaactctc aaggatctta ccgctgttga gatccagttc gatgtaaccc 8280 
actcgtgcac ccaactgatc ttcagcatct tttactttca ccagcgtttc tgggtgagca 8340 
aaaacaggaa ggcaaaatgc cgcaaaaaag ggaataaggg cgacacggaa atgttgaata 8400 
ctcatactct tcctttttca atattattga agcatttatc agggttattg tctcatgagc 8460 
ggatacatat ttgaatgtat ttagaaaaat aaacaaatag gggttccgcg cacatttc 8518 

<210> 4 
<211> 8175 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Nucleotide sequence for pICAST OMC 
<400> 4 

ctgcagcctg aatatgggcc aaacaggata tctgtggtaa gcagttcctg ccccggctca 60 

gggccaagaa cagatggaac agctgaatat gggccaaaca ggatatctgt ggtaagcagt 120 

tcctgccccg gctcagggcc aagaacagat ggtccccaga tgcggtccag ccctcagcag 180 

tttctagaga accatcagat gtttccaggg tgccccaagg acctgaaatg accctgtgcc 240 

ttatttgaac taaccaatca gttcgcttct cgcttctgtt cgcgcgcttc tgctccccga 300 

gctcaataaa agagcccaca acccctcact cggggcgcca gtcctccgat tgactgagtc 360 

gcccgggtac ccgtgtatcc aataaaccct cttgcagttg catccgactt gtggtctcgc 420 

tgttccttgg gagggtctcc tctgagtgat tgactacccg tcagcggggg tctttcattt 480 

gggggctcgt ccgggatcgg gagacccctg cccagggacc accgacccac caccgggagg 540 

caagctggcc agcaacttat ctgtgtctgt ccgattgtct agtgtctatg actgatttta 600 

tgcgcctgcg tcggtactag ttagctaact agctctgtat ctggcggacc cgtggtggaa 660 

ctgacgagtt ctgaacaccc ggccgcaacc ctgggagacg tcccagggac tttgggggcc 720 

gtttttgtgg cccgacctga ggaagggagt cgatgtggaa tccgaccccg tcaggatatg 780 

tggttctggt aggagacgag aacctaaaac agttcccgcc tccgtctgaa tttttgcttt 840 

cggtttggaa ccgaagccgc gcgtcttgtc tgctgcagca tcgttctgtg ttgtctctgt 900 
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ctgactgtgt ttctgtattt gtctgaaaat tagggccaga ctgttaccac tcccttaagt 960 
ttgaccttag gtaactggaa agatgtcgag cggctcgctc acaaccagtc ggtagatgtc 1020 
aagaagagac gttgggttac cttctgctct gcagaatggc caacctttaa cgtcggatgg 1080 
ccgcgagacg gcacctttaa ccgagacctc atcacccagg ttaagatcaa ggtcttttca 1140 
cctggcccgc atggacaccc agaccaggtc ccctacatcg tgacctggga agccttggct 1200 
tttgaccccc ctccctgggt caagcccttt gtacacccta agcctccgcc tcctcttcct 1260 
ccatccgccc cgtctctccc ccttgaacct cctcgttcga ccccgcctcg atcctccctt 1320 
tatccagccc tcactccttc tctaggcgcc ggccgctcta gcccattaat acgactcact 1380 
atagggcgat tcgaatcagg ccttggcgcg ccggatcctt aattaagcgc aattgggagg 1440 
tggcggtagc ctcgagatgg gcgtgattac ggattcactg gccgtcgttt tacaacgtcg 1500 
tgactgggaa aaccctggcg ttacccaact taatcgcctt gcagcacatc cccctttcgc 1560 
cagctggcgt aatagcgaag aggcccgcac cgatcgccct tcccaacagt tacgcagcct 1620 
gaatggcgaa tggcgctttg cctggtttcc ggcaccagaa gcggtgccgg aaagctggct 1680 
ggagtgcgat cttcctgagg ccgatactgt cgtcgtcccc tcaaactggc agatgcacgg 1740 
ttacgatgcg cccatctaca ccaacgtgac ctatcccatt acggtcaatc cgccgtttgt 1800 
tcccacggag aatccgacgg gttgttactc gctcacattt aatgttgatg aaagctggct 1860 
acaggaaggc cagacgcgaa ttatttttga tggcgttaac tcggcgtttc atctgtggtg 1920 
caacgggcgc tgggtcggtt acggccagga cagtcgtttg ccgtctgaat ttgacctgag 1980 
cgcattttta cgcgccggag aaaaccgcct cgcggtgatg gtgctgcgct ggagtgacgg 2040 
cagttatctg gaagatcagg atatgtggcg gatgagcggc attttccgtg acgtctcgtt 2100 
gctgcataaa ccgactacac aaatcagcga tttccatgtt gccactcgct ttaatgatga 2160 
tttcagccgc gctgtactgg aggctgaagt tcagatgtgc ggcgagttgc gtgactacct 2220 
acgggtaaca gtttctttat ggcagggtga aacgcaggtc gccagcggca ccgcgccttt 2280 
cggcggtgaa attatcgatg agcgtggtgg ttatgccgat cgcgtcacac tacgtctgaa 2340 
cgtcgaaaac ccgaaactgt ggagcgccga aatcccgaat ctctatcgtg cggtggttga 2400 
actgcacacc gccgacggca cgctgattga agcagaagcc tgcgatgtcg gtttccgcga 2460 
ggtgcggatt gaaaatggtc tgctgctgct gaacggcaag ccgttgctga ttcgaggcgt 2520 
taaccgtcac gagcatcatc ctctgcatgg tcaggtcatg gatgagcaga cgatggtgca 2580 
ggatatcctg ctgatgaagc agaacaactt taacgccgtg cgctgttcgc attatccgaa 2640 
ccatccgctg tggtacacgc tgtgcgaccg ctacggcctg tatgtggtgg atgaagccaa 2700 
tattgaaacc cacggcatgg tgccaatgaa tcgtctgacc gatgatccgc gctggctacc 2760 
ggcgatgagc gaacgcgtaa cgcgaatggt gcagcgcgat cgtaatcacc cgagtgtgat 2820 
catctggtcg ctggggaatg aatcaggcca cggcgctaat cacgacgcgc tgtatcgctg 2880 
gatcaaatct gtcgatcctt cccgcccggt gcagtatgaa ggcggcggag ccgacaccac 2940 
ggccaccgat attatttgcc cgatgtacgc gcgcgtggat gaagaccagc ccttcccggc 3000 
tgtgccgaaa tggtccatca aaaaatggct ttcgctacct ggagagacgc gcccgctgat 3060 
cctttgcgaa tacgcccacg cgatgggtaa cagtcttggc ggtttcgcta aatactggca 3120 
ggcgtttcgt cagtatcccc gtttacaggg cggcttcgtc tgggactggg tggatcagtc 3180 
gctgattaaa tatgatgaaa acggcaaccc gtggtcggct tacggcggtg attttggcga 3240 
tacgccgaac gatcgccagt tctgtatgaa cggtctggtc tttgccgacc gcacgccgca 3300 
tccagcgctg acggaagcaa aacaccagca gcagtttttc cagttccgtt tatccgggca 3360 
aaccatcgaa gtgaccagcg aatacctgtt ccgtcatagc gataacgagc tcctgcactg 3420 
gatggtggcg ctggatggta agccgctggc aagcggtgaa gtgcctctgg atgtcgctcc 3480 
acaaggtaaa cagttgattg aactgcctga actaccgcag ccggagagcg ccgggcaact 3540 
ctggctcaca gtacgcgtag tgcaaccgaa cgcgaccgca tggtcagaag ccgggcacat 3600 
cagcgcctgg cagcagtggc gtctggcgga aaacctcagt gtgacgctcc ccgccgcgtc 3660 
ccacgccatc ccgcatctga ccaccagcga aatggatttt tgcatcgagc tgggtaataa 3720 
gcgttggcaa tttaaccgcc agtcaggctt tctttcacag atgtggattg gcgataaaaa 3780 
acaactgctg acgccgctgc gcgatcagtt cacccgtgtc gatagatctg aacagaaact 3840 
catttccgaa gaagacctag tcgaccatca tcatcatcat caccggtaat aataggtaga 3900 
taagtgactg attagatgca tttcgactag atccctcgac caattccggt tattttccac 3960 
catattgccg tcttttggca atgtgagggc ccggaaacct ggccctgtct tcttgacgag 4020 
cattcctagg ggtctttccc ctctcgccaa aggaatgcaa ggtctgttga atgtcgtgaa 4080 
ggaagcagtt cctctggaag cttcttgaag acaaacaacg tctgtagcga ccctttgcag 4140 
gcagcggaac cccccacctg gcgacaggtg cctctgcggc caaaagccac gtgtataaga 4200 
tacacctgca aaggcggcac aaccccagtg ccacgttgtg agttggatag ttgtggaaag 4260 



agtcaaatgg ctctcctcaa gcgtattcaa caaggggctg aaggatgccc agaaggtacc 4320 

ccattgtatg ggatctgatc tggggcctcg gtgcacatgc tttacatgtg tttagtcgag 4380 

gttaaaaaac gtctaggccc cccgaaccac ggggacgtgg ttttcctttg aaaaacacga 4440 

tgataatacc atgaaaaagc ctgaactcac cgcgacgtct gtcgagaagt ttctgatcga 4500 

aaagttcgac agcgtctccg acctgatgca gctctcggag ggcgaagaat ctcgtgcttt 4560 

cagcttcgat gtaggagggc gtggatatgt cctgcgggta aatagctgcg ccgatggttt 4620 
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ctacaaagat cgttatgttt atcggcactt tgcatcggcc gcgctcccga ttccggaagt 4680 

gcttgacatt ggggaattta gcgagagcct gacctattgc atctcccgcc gtgcacaggg 4740 

tgtcacgttg caagacctgc ctgaaaccga actgcccgct gttctgcagc cggtcgcgga 4800 

ggccatggat gcgatcgctg cggccgatct tagccagacg agcgggttcg gcccattcgg 4860 

accgcaagga atcggtcaat acactacatg gcgtgatttc atatgcgcga ttgctgatcc 4920 

ccatgtgtat cactggcaaa ctgtgatgga cgacaccgtc agtgcgtccg tcgcgcaggc 4980 

tctcgatgag ctgatgcttt gggccgagga ctgccccgaa gtccggcacc tcgtgcacgc 5040 

ggatttcggc tccaacaatg tcctgacgga caatggccgc ataacagcgg tcattgactg 5100 

gagcgaggcg atgttcgggg attcccaata cgaggtcgcc aacatcttct tctggaggcc 5160 

gtggttggct tgtatggagc agcagacgcg ctacttcgag cggaggcatc cggagcttgc 5220 

aggatcgccg cggctccggg cgtatatgct ccgcattggt cttgaccaac tctatcagag 5280 

cttggttgac ggcaatttcg atgatgcagc ttgggcgcag ggtcgatgcg acgcaatcgt 5340 

ccgatccgga gccgggactg tcgggcgtac acaaatcgcc cgcagaagcg cggccgtctg 5400 

gaccgatggc tgtgtagaag tactcgccga tagtggaaac cgacgcccca gcactcgtcc 5460 

gagggcaaag gaatagagta gatgccgacc gggatctatc gataaaataa aagattttat 5520 

ttagtctcca gaaaaagggg ggaatgaaag accccacctg taggtttggc aagctagctt 5580 

aagtaacgcc attttgcaag gcatggaaaa atacataact gagaatagag aagttcagat 5640 

caaggtcagg aacagatgga acagctgaat atgggccaaa caggatatct gtggtaagca 5700 

gttcctgccc cggctcaggg ccaagaacag atggaacagc tgaatatggg ccaaacagga 5760 

tatctgtggt aagcagttcc tgccccggct cagggccaag aacagatggt ccccagatgc 5820 

ggtccagccc tcagcagttt ctagagaacc atcagatgtt tccagggtgc cccaaggacc 5880 

tgaaatgacc ctgtgcctta tttgaactaa ccaatcagtt cgcttctcgc ttctgttcgc 5940 

gcgcttctgc tccccgagct caataaaaga gcccacaacc cctcactcgg ggcgccagtc 6000 

ctccgattga ctgagtcgcc cgggtacccg tgtatccaat aaaccctctt gcagttgcat 6060 

ccgacttgtg gtctcgctgt tccttgggag ggtctcctct gagtgattga ctacccgtca 6120 

gcgggggtct ttcattcatg cagcatgtat caaaattaat ttggtttttt ttcttaagta 6180 

tttacattaa atggccatag ttgcattaat gaatcggcca acgcgcgggg agaggcggtt 6240 

tgcgtattgg cgctcttccg cttcctcgct cactgactcg ctgcgctcgg tcgttcggct 6300 

gcggcgagcg gtatcagctc actcaaaggc ggtaatacgg ttatccacag aatcagggga 6360 

taacgcagga aagaacatgt gagcaaaagg ccagcaaaag gccaggaacc gtaaaaaggc 6420 

cgcgttgctg gcgtttttcc ataggctccg cccccctgac gagcatcaca aaaatcgacg 6480 

ctcaagtcag aggtggcgaa acccgacagg actataaaga taccaggcgt ttccccctgg 6540 

aagctccctc gtgcgctctc ctgttccgac cctgccgctt accggatacc tgtccgcctt 6600 

tctcccttcg ggaagcgtgg cgctttctca tagctcacgc tgtaggtatc tcagttcggt 6660 

gtaggtcgtt cgctccaagc tgggctgtgt gcacgaaccc cccgttcagc ccgaccgctg 6720 

cgccttatcc ggtaactatc gtcttgagtc caacccggta agacacgact tatcgccact 6780 

ggcagcagcc actggtaaca ggattagcag agcgaggtat gtaggcggtg ctacagagtt 6840 

cttgaagtgg tggcctaact acggctacac tagaagaaca gtatttggta tctgcgctct 6900 

gctgaagcca gttaccttcg gaaaaagagt tggtagctct tgatccggca aacaaaccac 6960 

cgctggtagc ggtggttttt ttgtttgcaa gcagcagatt acgcgcagaa aaaaaggatc 7020 

tcaagaagat cctttgatct tttctacggg gtctgacgct cagtggaacg aaaactcacg 7080 

ttaagggatt ttggtcatga gattatcaaa aaggatcttc acctagatcc ttttaaatta 7140 

aaaatgaagt ttgcggccgc aaatcaatct aaagtatata tgagtaaact tggtctgaca 7200 

gttaccaatg cttaatcagt gaggcaccta tctcagcgat ctgtctattt cgttcatcca 7260 

tagttgcctg actccccgtc gtgtagataa ctacgatacg ggagggctta ccatctggcc 7320 

ccagtgctgc aatgataccg cgagacccac gctcaccggc tccagattta tcagcaataa 7380 

accagccagc cggaagggcc gagcgcagaa gtggtcctgc aactttatcc gcctccatcc 7440 

agtctattaa ttgttgccgg gaagctagag taagtagttc gccagttaat agtttgcgca 7500 

acgttgttgc cattgctaca ggcatcgtgg tgtcacgctc gtcgtttggt atggcttcat 7560 

tcagctccgg ttcccaacga tcaaggcgag ttacatgatc ccccatgttg tgcaaaaaag 7620 

cggttagctc cttcggtcct ccgatcgttg tcagaagtaa gttggccgca gtgttatcac 7680 

tcatggttat ggcagcactg cataattctc ttactgtcat gccatccgta agatgctttt 7740 

ctgtgactgg tgagtactca accaagtcat tctgagaata gtgtatgcgg cgaccgagtt 7800 

gctcttgccc ggcgtcaata cgggataata ccgcgccaca tagcagaact ttaaaagtgc 7860 

tcatcattgg aaaacgttct tcggggcgaa aactctcaag gatcttaccg ctgttgagat 7920 

ccagttcgat gtaacccact cgtgcaccca actgatcttc agcatctttt actttcacca 7980 

gcgtttctgg gtgagcaaaa acaggaaggc aaaatgccgc aaaaaaggga ataagggcga 8040 

cacggaaatg ttgaatactc atactcttcc tttttcaata ttattgaagc atttatcagg 8100 

gttattgtct catgagcgga tacatatttg aatgtattta gaaaaataaa caaatagggg 8160 

ttccgcgcac atttc 8175 
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<210> 5 
<211> 8175 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Nucleotide sequence for pICAST OMN 



<400> 5 

ctgcagcctg 

gggccaagaa 

tcctgccccg 

tttctagaga 

ttatttgaac 

gctcaataaa 

gcccgggtac 

tgttccttgg 

gggggctcgt 

caagctggcc 

tgcgcctgcg 

ctgacgagtt 

gtttttgtgg 

tggttctggt 

cggtttggaa 

ctgactgtgt 

ttgaccttag 

aagaagagac 

ccgcgagacg 

cctggcccgc 

tttgaccccc 

ccatccgccc 

tatccagccc 

atagggcgat 

tggcggtagc 

tgactgggaa 

cagctggcgt 

gaatggcgaa 

ggagtgcgat 

ttacgatgcg 

tcccacggag 

acaggaaggc 

caacgggcgc 

cgcattttta 

cagttatctg 

gctgcataaa 

tttcagccgc 

acgggtaaca 

cggcggtgaa 

cgtcgaaaac 

actgcacacc 

ggtgcggatt 

taaccgtcac 

ggatatcctg 

ccatccgctg 

tattgaaacc 

ggcgatgagc 



aatatgggcc 
cagatggaac 
gctcagggcc 
accatcagat 
taaccaatca 
agagcccaca 
ccgtgtatcc 
gagggtctcc 
ccgggatcgg 
agcaacttat 
tcggtactag 
ctgaacaccc 
cccgacctga 
aggagacgag 
ccgaagccgc 
ttctgtattt 
gtaactggaa 
gttgggttac 
gcacctttaa 
atggacaccc 
ctccctgggt 
cgtctctccc 
tcactccttc 
tcgaatcagg 
ctcgagatgg 
aaccctggcg 
aatagcgaag 
tggcgctttg 
cttcctgagg 
cccatctaca 
aatccgacgg 
cagacgcgaa 
tgggtcggtt 
cgcgccggag 
gaagatcagg 
ccgactacac 
gctgtactgg 
gtttctttat 
attatcgatg 
ccgaaactgt 
gccgacggca 
gaaaatggtc 
gagcatcatc 
ctgatgaagc 
tggtacacgc 
cacggcatgg 
gaacgcgtaa 



aaacaggata 
agctgaatat 
aagaacagat 
gtttccaggg 
gttcgcttct 
acccctcact 
aataaaccct 
tctgagtgat 
gagacccctg 
ctgtgtctgt 
ttagctaact 
ggccgcaacc 
ggaagggagt 
aacctaaaac 
gcgtcttgtc 
gtctgaaaat 
agatgtcgag 
cttctgctct 
ccgagacctc 
agaccaggtc 
caagcccttt 
ccttgaacct 
tctaggcgcc 
ccttggcgcg 
gcgtgattac 
ttacccaact 
aggcccgcac 
cctggtttcc 
ccgatactgt 
ccaacgtgac 
gttgttactc 
ttatttttga 
acggccagga 
aaaaccgcct 
atatgtggcg 
aaatcagcga 
aggctgaagt 
ggcagggtga 
agcgtggtgg 
ggagcgccga 
cgctgattga 
tgctgctgct 
ctctgcatgg 
agaacaactt 
tgtgcgaccg 
tgccaatgaa 
cgcgaatggt 



tctgtggtaa 
gggccaaaca 
ggtccccaga 
tgccccaagg 
cgcttctgtt 
cggggcgcca 
cttgcagttg 
tgactacccg 
cccagggacc 
ccgattgtct 
agctctgtat 
ctgggagacg 
cgatgtggaa 
agttcccgcc 
tgctgcagca 
tagggccaga 
cggctcgctc 
gcagaatggc 
atcacccagg 
ccctacatcg 
gtacacccta 
cctcgttcga 
ggccgctcta 
ccggatcctt 
ggattcactg 
taatcgcctt 
cgatcgccct 
ggcaccagaa 
cgtcgtcccc 
ctatcccatt 
gctcacattt 
tggcgttaac 
cagtcgtttg 
cgcggtgatg 
gatgagcggc 
tttccatgtt 
tcagatgtgc 
aacgcaggtc 
ttatgccgat 
aatcccgaat 
agcagaagcc 
gaacggcaag 
tcaggtcatg 
taacgccgtg 
ctacggcctg 
tcgtctgacc 
gcagcgcgat 



gcagttcctg 
ggatatctgt 
tgcggtccag 
acctgaaatg 
cgcgcgcttc 
gtcctccgat 
catccgactt 
tcagcggggg 
accgacccac 
agtgtctatg 
ctggcggacc 
tcccagggac 
tccgaccccg 
tccgtctgaa 
tcgttctgtg 
ctgttaccac 
acaaccagtc 
caacctttaa 
ttaagatcaa 
tgacctggga 
agcctccgcc 
ccccgcctcg 
gcccattaat 
aattaagcgc 
gccgtcgttt 
gcagcacatc 
tcccaacagt 
gcggtgccgg 
tcaaactggc 
acggtcaatc 
aatgttgatg 
tcggcgtttc 
ccgtctgaat 
gtgctgcgct 
attttccgtg 
gccactcgct 
ggcgagttgc 
gccagcggca 
cgcgtcacac 
ctctatcgtg 
tgcgatgtcg 
ccgttgctga 
gatgagcaga 
cgctgttcgc 
tatgtggtgg 
gatgatccgc 
cgtaatcacc 



ccccggctca 
ggtaagcagt 
ccctcagcag 
accctgtgcc 
tgctccccga 
tgactgagtc 
gtggtctcgc 
tctttcattt 
caccgggagg 
actgatttta 
cgtggtggaa 
tttgggggcc 
tcaggatatg 
tttttgcttt 
ttgtctctgt 
tcccttaagt 
ggtagatgtc 
cgtcggatgg 
ggtcttttca 
agccttggct 
tcctcttcct 
atcctccctt 
acgactcact 
aattgggagg 
tacaacgtcg 
cccctttcgc 
tacgcagcct 
aaagctggct 
agatgcacgg 
cgccgtttgt 
aaagctggct 
atctgtggtg 
ttgacctgag 
ggagtgacgg 
acgtctcgtt 
ttaatgatga 
gtgactacct 
ccgcgccttt 
tacgtctgaa 
cggtggttga 
gtttccgcga 
ttcgaggcgt 
cgatggtgca 
attatccgaa 
atgaagccaa 
gctggctacc 
cgagtgtgat 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2580 

2640 

2700 

2760 

2820 



catctggtcg 
gatcaaatct 
ggccaccgat 
tgtgccgaaa 
cctttgcgaa 
ggcgtttcgt 



ctggggaatg 
gtcgatcctt 
attatttgcc 
tggtccatca 
tacgcccacg 
cagtatcccc 



aatcaggcca 
cccgcccggt 
cgatgtacgc 
aaaaatggct 
cgatgggtaa 
gtttacaggg 



cggcgctaat 
gcagtatgaa 
gcgcgtggat 
ttcgctacct 
cagtcttggc 
cggcttcgtc 



cacgacgcgc 
ggcggcggag 
gaagaccagc 
ggagagacgc 
ggtttcgcta 
tgggactggg 



tgtatcgctg 
ccgacaccac 
ccttcccggc 
gcccgctgat 
aatactggca 
tggatcagtc 



2880 
2940 
3000 
3060 
3120 
3180 
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gctgattaaa 
tacgccgaac 
tccagcgctg 
aaccatcgaa 
gatggtggcg 
acaaggtaaa 
ctggctcaca 
cagcgcctgg 
ccacgccatc 
gcgttggcaa 
acaactgctg 
catttccgaa 
taagtgactg 
catattgccg 
cattcctagg 
ggaagcagtt 
gcagcggaac 
tacacctgca 
agtcaaatgg 
ccattgtatg 
gttaaaaaac 
tgataatacc 
aaagttcgac 
cagcttcgat 
ctacaaagat 
gcttgacatt 
tgtcacgttg 
ggccatggat 
accgcaagga 
ccatgtgtat 
tctcgatgag 
ggatttcggc 
gagcgaggcg 
gtggttggct 
aggatcgccg 
cttggttgac 
ccgatccgga 
gaccgatggc 
gagggcaaag 
ttagtctcca 
aagtaacgcc 
caaggtcagg 
gttcctgccc 
tatctgtggt 
ggtccagccc 
tgaaatgacc 
gcgcttctgc 
ctccgattga 
ccgacttgtg 
gcgggggtct 
tttacattaa 
tgcgtattgg 
gcggcgagcg 
taacgcagga 
cgcgttgctg 
ctcaagtcag 
aagctccctc 
tctcccttcg 
gtaggtcgtt 
cgccttatcc 
ggcagcagcc 
cttgaagtgg 



tatgatgaaa 
gatcgccagt 
acggaagcaa 
gtgaccagcg 
ctggatggta 
cagttgattg 
gtacgcgtag 
cagcagtggc 
ccgcatctga 
tttaaccgcc 
acgccgctgc 
gaagacctag 
attagatgca 
tcttttggca 
ggtctttccc 
cctctggaag 
cccccacctg 
aaggcggcac 
ctctcctcaa 
ggatctgatc 
gtctaggccc 
atgaaaaagc 
agcgtctccg 
gtaggagggc 
cgttatgttt 
ggggaattta 
caagacctgc 
gcgatcgctg 
atcggtcaat 
cactggcaaa 
ctgatgcttt 
tccaacaatg 
atgttcgggg 
tgtatggagc 
cggctccggg 
ggcaatttcg 
gccgggactg 
tgtgtagaag 
gaatagagta 
gaaaaagggg 
attttgcaag 
aacagatgga 
cggctcaggg 
aagcagttcc 
tcagcagttt 
ctgtgcctta 
tccccgagct 
ctgagtcgcc 
gtctcgctgt 
ttcattcatg 
atggccatag 
cgctcttccg 
gtatcagctc 
aagaacatgt 
gcgtttttcc 
aggtggcgaa 



gtgcgctctc 
ggaagcgtgg 
cgctccaagc 
ggtaactatc 
actggtaaca 
tggcctaact 



acggcaaccc 
tctgtatgaa 
aacaccagca 
aatacctgtt 
agccgctggc 
aactgcctga 
tgcaaccgaa 
gtctggcgga 
ccaccagcga 
agtcaggctt 
gcgatcagtt 
tcgaccatca 
tttcgactag 
atgtgagggc 
ctctcgccaa 
cttcttgaag 
gcgacaggtg 
aaccccagtg 
gcgtattcaa 
tggggcctcg 
cccgaaccac 
ctgaactcac 
acctgatgca 
gtggatatgt 
atcggcactt 
gcgagagcct 
ctgaaaccga 
cggccgatct 
acactacatg 
ctgtgatgga 
gggccgagga 
tcctgacgga 
attcccaata 
agcagacgcg 
cgtatatgct 
atgatgcagc 
tcgggcgtac 
tactcgccga 
gatgccgacc 
ggaatgaaag 
gcatggaaaa 
acagctgaat 
ccaagaacag 
tgccccggct 
ctagagaacc 
tttgaactaa 
caataaaaga 
cgggtacccg 
tccttgggag 
cagcatgtat 
ttgcattaat 
cttcctcgct 
actcaaaggc 
gagcaaaagg 
ataggctccg 
acccgacagg 



ctgttccgac 
cgctttctca 
tgggctgtgt 
gtcttgagtc 
ggattagcag 
acggctacac 



gtggtcggct 
cggtctggtc 
gcagtttttc 
ccgtcatagc 
aagcggtgaa 
actaccgcag 
cgcgaccgca 
aaacctcagt 
aatggatttt 
tctttcacag 
cacccgtgtc 
tcatcatcat 
atccctcgac 
ccggaaacct 
aggaatgcaa 
acaaacaacg 
cctctgcggc 
ccacgttgtg 
caaggggctg 
gtgcacatgc 
ggggacgtgg 
cgcgacgtct 
gctctcggag 
cctgcgggta 
tgcatcggcc 
gacctattgc 
actgcccgct 
tagccagacg 
gcgtgatttc 
cgacaccgtc 
ctgccccgaa 
caatggccgc 
cgaggtcgcc 
ctacttcgag 
ccgcattggt 
ttgggcgcag 
acaaatcgcc 
tagtggaaac 
gggatctatc 
accccacctg 
atacataact 
atgggccaaa 
atggaacagc 
cagggccaag 
atcagatgtt 
ccaatcagtt 
gcccacaacc 
tgtatccaat 
ggtctcctct 
caaaattaat 
gaatcggcca 
cactgactcg 
ggtaatacgg 
ccagcaaaag 
cccccctgac 
actataaaga 



tacggcggtg 
tttgccgacc 
cagttccgtt 
gataacgagc 
gtgcctctgg 
ccggagagcg 
tggtcagaag 
gtgacgctcc 
tgcatcgagc 
atgtggattg 
gatagatctg 
caccggtaat 
caattccggt 
ggccctgtct 
ggtctgttga 
tctgtagcga 
caaaagccac 
agttggatag 
aaggatgccc 
tttacatgtg 
ttttcctttg 
gtcgagaagt 
ggcgaagaat 
aatagctgcg 
gcgctcccga 
atctcccgcc 
gttctgcagc 
agcgggttcg 
atatgcgcga 
agtgcgtccg 
gtccggcacc 
ataacagcgg 
aacatcttct 
cggaggcatc 
cttgaccaac 
ggtcgatgcg 
cgcagaagcg 
cgacgcccca 
gataaaataa 
taggtttggc 
gagaatagag 
caggatatct 
tgaatatggg 
aacagatggt 
tccagggtgc 
cgcttctcgc 
cctcactcgg 
aaaccctctt 
gagtgattga 
ttggtttttt 
acgcgcgggg 
ctgcgctcgg 
ttatccacag 
gccaggaacc 
gagcatcaca 
taccaggcgt 



attttggcga 
gcacgccgca 
tatccgggca 
tcctgcactg 
atgtcgctcc 
ccgggcaact 
ccgggcacat 
ccgccgcgtc 
tgggtaataa 
gcgataaaaa 
aacagaaact 
aataggtaga 
tattttccac 
tcttgacgag 
atgtcgtgaa 
ccctttgcag 
gtgtataaga 
ttgtggaaag 
agaaggtacc 
tttagtcgag 
aaaaacacga 
ttctgatcga 
ctcgtgcttt 
ccgatggttt 
ttccggaagt 
gtgcacaggg 
cggtcgcgga 
gcccattcgg 
ttgctgatcc 
tcgcgcaggc 
tcgtgcacgc 
tcattgactg 
tctggaggcc 
cggagcttgc 
tctatcagag 
acgcaatcgt 
cggccgtctg 
gcactcgtcc 
aagattttat 
aagctagctt 
aagttcagat 
gtggtaagca 
ccaaacagga 
ccccagatgc 
cccaaggacc 
ttctgttcgc 
ggcgccagtc 
gcagttgcat 
ctacccgtca 
ttcttaagta 
agaggcggtt 
tcgttcggct 
aatcagggga 
gtaaaaaggc 
aaaatcgacg 
ttccccctgg 



3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4320 
4380 
4440 
4500 
4560 
4620 
4680 
4740 
4800 
4860 
4920 
4980 
5040 
5100 
5160 
5220 
5280 
5340 
5400 
5460 
5520 
5580 
5640 
5700 
5760 
5820 
5880 
5940 
6000 
6060 
6120 
6180 
6240 
6300 
6360 
6420 
6480 
6540 



cctgccgctt 
tagctcacgc 
gcacgaaccc 
caacccggta 
agcgaggtat 
tagaagaaca 



accggatacc 
tgtaggtatc 
cccgttcagc 
agacacgact 
gtaggcggtg 
gtatttggta 



tgtccgcctt 
tcagttcggt 
ccgaccgctg 
tatcgccact 
ctacagagtt 
tctgcgctct 



6600 
6660 
6720 
6780 
6840 
6900 
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gctgaagcca 
cgctggtagc 
tcaagaagat 
ttaagggatt 
aaaatgaagt 
gttaccaatg 
tagttgcctg 
ccagtgctgc 
accagccagc 
agtctattaa 
acgttgttgc 
tcagctccgg 
cggttagctc 
tcatggttat 
ctgtgactgg 
gctcttgccc 
tcatcattgg 
ccagttcgat 
gcgtttctgg 
cacggaaatg 
gttattgtct 
ttccgcgcac 



gttaccttcg 
ggtggttttt 
cctttgatct 
ttggtcatga 
ttgcggccgc 
cttaatcagt 
actccccgtc 
aatgataccg 
cggaagggcc 
ttgttgccgg 
cattgctaca 
ttcccaacga 
cttcggtcct 
ggcagcactg 
tgagtactca 
ggcgtcaata 
aaaacgttct 
gtaacccact 
gtgagcaaaa 
ttgaatactc 
catgagcgga 
atttc 



gaaaaagagt 
ttgtttgcaa 
tttctacggg 
gattatcaaa 
aaatcaatct 
gaggcaccta 
gtgtagataa 
cgagacccac 
gagcgcagaa 
gaagctagag 
ggcatcgtgg 
tcaaggcgag 
ccgatcgttg 
cataattctc 
accaagtcat 
cgggataata 
tcggggcgaa 
cgtgcaccca 
acaggaaggc 
atactcttcc 
tacatatttg 



tggtagctct 
gcagcagatt 
gtctgacgct 
aaggatcttc 
aaagtatata 
tctcagcgat 
ctacgatacg 
gctcaccggc 
gtggtcctgc 
taagtagttc 
tgtcacgctc 
ttacatgatc 
tcagaagtaa 
ttactgtcat 
tctgagaata 
ccgcgccaca 
aactctcaag 
actgatcttc 
aaaatgccgc 
tttttcaata 
aatgtattta 



tgatccggca 
acgcgcagaa 
cagtggaacg 
acctagatcc 
tgagtaaact 
ctgtctattt 
ggagggctta 
tccagattta 
aactttatcc 
gccagttaat 
gtcgtttggt 
ccccatgttg 
gttggccgca 
gccatccgta 
gtgtatgcgg 
tagcagaact 
gatcttaccg 
agcatctttt 
aaaaaaggga 
ttattgaagc 
gaaaaataaa 



aacaaaccac 
aaaaaggatc 
aaaactcacg 
ttttaaatta 
tggtctgaca 
cgttcatcca 
ccatctggcc 
tcagcaataa 
gcctccatcc 
agtttgcgca 
atggcttcat 
tgcaaaaaag 
gtgttatcac 
agatgctttt 
cgaccgagtt 
ttaaaagtgc 
ctgttgagat 
actttcacca 
ataagggcga 
atttatcagg 
caaatagggg 



6960 
7020 
7080 
7140 
7200 
7260 
7320 
7380 
7440 
7500 
7560 
7620 
7680 
7740 
7800 
7860 
7920 
7980 
8040 
8100 
8160 
8175 



<210> 6 
<211> 5 
<212> PRT 

<213> Artificial Sequence 
<220> 

<223> GS Linker 



<400> 6 

Gly Gly Gly Gly Ser 
1 5 
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